#!/usr/bin/python
#  -*- coding:utf-8 -*-

from contextlib import closing

try:  # Python 3
    from urllib.request import urlopen
except ImportError:  # Python 2
    from urllib import urlopen

from bs4 import BeautifulSoup

# Parse a minimal in-memory document.  The parser is named explicitly so the
# resulting tree does not depend on which parsers happen to be installed
# (bs4 otherwise picks one itself and emits a warning); 'html5lib' is the
# parser this script already relies on below.
soup1 = BeautifulSoup("<html></html>", 'html5lib')

# Fetch the Baidu home page and parse it.  closing() guarantees the HTTP
# response is closed once parsing is done, even if BeautifulSoup raises.
with closing(urlopen("http://www.baidu.com/")) as response:
    soup3 = BeautifulSoup(response, 'html5lib')

# Extract the document's text content (markup stripped) and print it.
# The parenthesised single-argument form behaves the same under the
# Python 2 print statement and the Python 3 print function.
text = soup3.get_text()
print(text)

